Here, we will be using the concept of Reinforcement Learning. We already know Supervised Learning, in which we have a labelled dataset, and Unsupervised Learning, which works on an unlabelled dataset. Reinforcement Learning is very similar to the way we teach children or pets: we give a positive reward whenever they do something good or obey us properly, and a negative reward (or scold them) whenever they do something wrong. For this, we have two methods: Upper Confidence Bound (UCB) and Thompson Sampling.
We know about the Multi-Armed Bandit problem, in which we have several machines, each running its own algorithm, and depending on the money we put into a machine we get some outcome, for example part of the money back or some chocolates, in which case we win. Our goal is to maximize the return. Each machine has its own reward distribution. Initially we try each machine, and if one gives a high return we spend more on that machine.

An application of this problem is in the advertising industry, where we have different ads and we want to know which ad has more impact on the users. We can do this on a trial basis: if a user clicks on the ad, the ad is having an impact and is giving the product more visibility. Suppose we have d arms; here the arms are the ads that we display to the user when they connect to a web page. Each time a user connects to a web page, it makes a round. At each round n, we choose one ad to display to the user. At round n, ad i gives a reward $r_i(n) \in \{0, 1\}$ (if the user clicks on the ad we record a 1, else a 0). Our goal is to maximize the total reward.
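To make the setup concrete, here is a minimal sketch of a simulated Bernoulli bandit. The click probabilities in true_ctr are made-up numbers (not taken from the dataset used below), and pull() stands in for showing an ad once and observing whether the user clicks; a purely random strategy is used just to illustrate the reward accounting.

import random

true_ctr = [0.05, 0.13, 0.09]  # hypothetical click probability of each ad

def pull(arm):
    # Show ad 'arm' once and return 1 if the (simulated) user clicks, else 0
    return 1 if random.random() < true_ctr[arm] else 0

total_reward = 0
for n in range(1000):                         # 1000 rounds (page visits)
    arm = random.randrange(len(true_ctr))     # naive strategy: pick an ad at random
    total_reward += pull(arm)
print(total_reward)

UCB and Thompson Sampling replace the random choice above with smarter selection rules, which is what the rest of this section builds up.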
Difference between UCB and Thompson Sampling
UCB | Thompson Sampling |
---|---|
It is a deterministic approach. | It is a probabilistic approach. |
It requires an update after every round. | It can accommodate delayed feedback. |
It has weaker empirical evidence. | It has better empirical evidence. |
In Upper Confidence Bound, each machine has its own reward distribution, and we try to find the most rewarding one by comparing those distributions. We do not want our estimate for a machine to be skewed just because it has been tried only a few times, so around each observed average we keep a confidence interval and always pick the machine whose upper confidence bound is currently the highest.
Algorithm: Step 1: At each round n, we consider two numbers for each ad i:
$N_i(n)$: the number of times ad i was selected up to round n
$R_i(n)$: the sum of the rewards of ad i up to round n
Step 2: From these computed numbers, we calculate the average reward of ad i up to round n and the width of its confidence interval: $\bar{r}_i(n) = \frac{R_i(n)}{N_i(n)}$ and $\delta_i(n) = \sqrt{\frac{3\log(n)}{2\,N_i(n)}}$.
Step 3: Select the ad i which has the maximum upper confidence bound, $\bar{r}_i(n) + \delta_i(n)$.
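As a quick illustration of Steps 2 and 3, suppose at round n = 100 ad 1 has been shown 60 times with 9 clicks and ad 2 has been shown 40 times with 5 clicks (made-up counts, not taken from the dataset):

import math

n = 100          # hypothetical round number
N_i = [60, 40]   # times each ad has been selected so far
R_i = [9, 5]     # total clicks each ad has collected so far

for i in range(2):
    average_reward = R_i[i] / N_i[i]
    delta_i = math.sqrt(3/2 * math.log(n) / N_i[i])
    print("Ad", i + 1, "UCB =", average_reward + delta_i)

Ad 1 has the higher average (0.150 vs 0.125), but ad 2 has been shown fewer times, so its wider confidence interval gives it the larger upper bound (about 0.54 vs 0.49) and it would be selected next; this is how UCB keeps exploring less-tried options.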
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import math
A company conducted a survey, collecting data on how users responded to the different ads it had created. In the dataset, '1' indicates that the user clicked on the ad, whereas '0' indicates that the user did not click on it. The best ad is not known initially, but we try to find it with the help of the model, because no one knows in advance which ads the users might love.
dataset = pd.read_csv("C:\\Users\\aashi\\anaconda3\\Jupyter Notebooks\\1stop.ai\\Best Ads Predictor\\Ads_CTR_Optimisation.csv")
dataset
| | Ad 1 | Ad 2 | Ad 3 | Ad 4 | Ad 5 | Ad 6 | Ad 7 | Ad 8 | Ad 9 | Ad 10 |
---|---|---|---|---|---|---|---|---|---|---|
0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 |
1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 |
2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
3 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
9995 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
9996 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
9997 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
9998 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
9999 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
10000 rows × 10 columns
dataset.head()
| | Ad 1 | Ad 2 | Ad 3 | Ad 4 | Ad 5 | Ad 6 | Ad 7 | Ad 8 | Ad 9 | Ad 10 |
---|---|---|---|---|---|---|---|---|---|---|
0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 |
1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 |
2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
3 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
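As a quick sanity check (not something the bandit algorithm is allowed to use, since in a live setting these click rates are unknown in advance), the overall click-through rate of each column can be inspected directly:

dataset.mean()   # fraction of rounds in which each ad was clicked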
N = 10000  # number of rounds (rows in the dataset)
d = 10     # number of ads
ads_selected = []               # ad chosen at each round
number_of_selections = [0] * d  # N_i(n): times each ad has been selected
sum_of_rewards = [0] * d        # R_i(n): total reward collected by each ad
total_reward = 0

for n in range(0, N):
    ad = 0
    max_upper_bound = 0
    for i in range(0, d):
        if number_of_selections[i] > 0:
            average_reward = sum_of_rewards[i] / number_of_selections[i]
            delta_i = math.sqrt(3/2 * math.log(n + 1) / number_of_selections[i])
            upper_bound = average_reward + delta_i
        else:
            # Ad not tried yet: use an effectively infinite bound so every ad is selected at least once
            upper_bound = 1e400
        if upper_bound > max_upper_bound:
            max_upper_bound = upper_bound
            ad = i
    ads_selected.append(ad)
    number_of_selections[ad] += 1
    reward = dataset.values[n, ad]
    sum_of_rewards[ad] += reward
    total_reward += reward
plt.hist(ads_selected)
plt.title("Histogram of Ads Selected")
plt.xlabel("Ads")
plt.ylabel("No. of times each Ad was selected")
Text(0, 0.5, 'No. of times each Ad was selected')
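To read off which ad the algorithm ends up preferring, one can also print the selection counts and the accumulated reward (a small addition, not part of the original notebook):

best_ad = number_of_selections.index(max(number_of_selections))
print("Most selected ad:", best_ad + 1)  # +1 because the columns are named Ad 1 .. Ad 10
print("Total reward:", total_reward)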
Here, we will be using Bayesian inference. In this, ad i gets its reward y from a Bernoulli distribution: $p(y|\theta_i) \sim \mathcal{B}(\theta_i)$.
Now, $\theta_i$ is unknown initially, but we express our uncertainty by assuming it has a uniform distribution, $p(\theta_i) \sim \mathcal{U}([0,1])$, which is the prior distribution, and then we apply Bayes' rule. By Bayes' rule, the posterior distribution is: $p(\theta_i \mid y) = \dfrac{p(y|\theta_i)\,p(\theta_i)}{\int p(y|\theta_i)\,p(\theta_i)\,d\theta_i}$
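Because the prior is uniform (the same as a Beta(1, 1) distribution) and the likelihood is Bernoulli, this posterior has a simple closed form; this standard conjugacy result, stated here for clarity, is exactly what the random.betavariate call in the code below relies on:

$$\theta_i \sim \mathrm{Beta}\big(N_i^1(n) + 1,\; N_i^0(n) + 1\big)$$

where $N_i^1(n)$ is the number of times ad i has received reward 1 up to round n and $N_i^0(n)$ the number of times it has received reward 0. At each round, Thompson Sampling draws one such sample per ad and displays the ad with the highest draw.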
import pandas as pd
import matplotlib.pyplot as plt
import random
dataset = pd.read_csv("C:\\Users\\aashi\\anaconda3\\Jupyter Notebooks\\1stop.ai\\Best Ads Predictor\\Ads_CTR_Optimisation.csv")
dataset
| | Ad 1 | Ad 2 | Ad 3 | Ad 4 | Ad 5 | Ad 6 | Ad 7 | Ad 8 | Ad 9 | Ad 10 |
---|---|---|---|---|---|---|---|---|---|---|
0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 |
1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 |
2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
3 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
9995 | 0 | 0 | 1 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
9996 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
9997 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
9998 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
9999 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
10000 rows × 10 columns
dataset.head()
| | Ad 1 | Ad 2 | Ad 3 | Ad 4 | Ad 5 | Ad 6 | Ad 7 | Ad 8 | Ad 9 | Ad 10 |
---|---|---|---|---|---|---|---|---|---|---|
0 | 1 | 0 | 0 | 0 | 1 | 0 | 0 | 0 | 1 | 0 |
1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 1 | 0 |
2 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
3 | 0 | 1 | 0 | 0 | 0 | 0 | 0 | 1 | 0 | 0 |
4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
N = 10000  # number of rounds (rows in the dataset)
d = 10     # number of ads
ads_selected = []              # ad chosen at each round
number_of_rewards_1 = [0] * d  # times each ad received reward 1 (a click)
number_of_rewards_0 = [0] * d  # times each ad received reward 0 (no click)
total_reward = 0

for n in range(0, N):
    ad = 0
    max_random = 0
    for i in range(0, d):
        # Draw theta_i from its Beta posterior (uniform prior + observed clicks/non-clicks)
        random_beta = random.betavariate(number_of_rewards_1[i] + 1, number_of_rewards_0[i] + 1)
        if random_beta > max_random:
            max_random = random_beta
            ad = i
    ads_selected.append(ad)
    reward = dataset.values[n, ad]
    if reward == 1:
        number_of_rewards_1[ad] += 1
    else:
        number_of_rewards_0[ad] += 1
    total_reward += reward
plt.hist(ads_selected)
plt.title("Histogram for Selected Ads")
plt.xlabel("Ads")
plt.ylabel("No. of times the Ad was selected")
Text(0, 0.5, 'No. of times the Ad was selected')
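As with UCB, the preferred ad and the accumulated reward can be printed directly (again a small addition for comparison, not part of the original notebook):

selection_counts = [ads_selected.count(i) for i in range(d)]
print("Most selected ad:", selection_counts.index(max(selection_counts)) + 1)  # columns are Ad 1 .. Ad 10
print("Total reward:", total_reward)

Comparing total_reward between the two runs gives a rough empirical comparison of UCB and Thompson Sampling on this dataset.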